{
 "cells": [
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "# 期末-猎聘\n",
    "* 方法介绍\n",
    "  * 使用 requests-html 爬取并存取网页文字档，查找[requests-html 中文文档](https://cncert.github.io/requests-html-doc-cn/#/)\n",
    "  * [xpath 语法](https://www.w3cschool.cn/xpath/xpath-syntax.html)丶[xpath 节点](https://www.w3cschool.cn/xpath/xpath-nodes.html)\n",
    "  *  拆解带有参数的URL，并再从query取出参数\n",
    "    * URL拆解: 使用[urllib.parse](https://docs.python.org/3/library/urllib.parse.html)解析出(query)[https://blog.csdn.net/thc1987/article/details/79347054]\n",
    "    * query拆解: 取出参数 成python字典\n",
    "  * 有基底URL，加上参数字典，请求新网页连续技\n",
    "  * 使用[pandas.DataFrame](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.html)进行数据整理以及分析\n",
    "    * 数据导出\n",
    "    \n",
    "    ``` csv = pd.to_csv(\"路径文档名\",encoding=\"utf8\")\n",
    "    tsv = pd.to_csv(\"路径文档名\"，encoding=\"utf8\",sep=\"\\t\")，注意csv\n",
    "    excel = pd.to_excel(\"路径文档名\"，sheet_name=\"分页名称\")\n",
    "    ```"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 基本模块\n",
    "import pandas as pd\n",
    "from requests_html import HTMLSession\n",
    "from urllib.parse import urlparse, parse_qs"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 行业参数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'互联网/电商': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_01&jobKind=&industries=040&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '游戏产业': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_01&jobKind=&industries=420&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '计算机软件': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_01&jobKind=&industries=010&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " 'IT服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_01&jobKind=&industries=030&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '电子/芯片/半导体': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_02&jobKind=&industries=050&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '通信业': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_02&jobKind=&industries=060&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '计算机/网络设备': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_02&jobKind=&industries=020&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '房地产/建筑': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_03&jobKind=&industries=080&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '规划/设计/装潢': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_03&jobKind=&industries=100&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '房地产服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_03&jobKind=&industries=090&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '银行': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_04&jobKind=&industries=130&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '保险': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_04&jobKind=&industries=140&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '基金/证券/投资': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_04&jobKind=&industries=150&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '会计/审计': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_04&jobKind=&industries=430&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '信托/担保/拍卖': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_04&jobKind=&industries=500&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '快消品': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=190&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '批发零售': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=240&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '服装纺织': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=200&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '家具/家电': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=210&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '办公设备': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=220&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '奢侈品/收藏品': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=460&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '珠宝/玩具/工艺品': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_05&jobKind=&industries=470&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '汽车/摩托车': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_06&jobKind=&industries=350&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '机械/机电/重工': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_06&jobKind=&industries=360&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '印刷/包装/造纸': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_06&jobKind=&industries=180&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '原材料加工': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_06&jobKind=&industries=370&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '仪器/电气/自动化': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_06&jobKind=&industries=340&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '制药/生物工程': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_10&jobKind=&industries=270&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '医疗/保健/美容': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_10&jobKind=&industries=280&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '医疗器械': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_10&jobKind=&industries=290&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '能源/水利': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_11&jobKind=&industries=330&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '石油/化工': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_11&jobKind=&industries=310&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '采掘/冶炼/矿产': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_11&jobKind=&industries=320&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '环保': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_11&jobKind=&industries=300&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '新能源': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_11&jobKind=&industries=490&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '专业服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=120&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '中介服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=110&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '外包服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=440&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '检测/认证': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=450&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '餐饮/酒旅/服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=230&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '文体娱乐': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=260&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '租赁服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_07&jobKind=&industries=510&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '广告/市场/会展': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_08&jobKind=&industries=070&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '影视文化': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_08&jobKind=&industries=170&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '教育培训': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_08&jobKind=&industries=380&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '交通/物流/运输': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_09&jobKind=&industries=250&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '贸易/进出口': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_09&jobKind=&industries=160&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '航空/航天': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_09&jobKind=&industries=480&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '政务/公共服务': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_12&jobKind=&industries=390&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '农林牧渔': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_12&jobKind=&industries=410&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944',\n",
       " '其他行业': '/zhaopin/?flushckid=1&compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=&compIds=&subIndustry=&industryType=industry_12&jobKind=&industries=400&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944'}"
      ]
     },
     "execution_count": 51,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "url = \"https://www.liepin.com/zhaopin/?key=PRD\"\n",
    "session = HTMLSession()\n",
    "r = session.get( url )\n",
    "\n",
    "行业数据选择器链结 = r.html.xpath('//ul[@class=\"clearfix\"]/li/div/a')\n",
    "行业数据选择器链结\n",
    "\n",
    "# 爬起行业数据链接的文字以及链接\n",
    "行业数据选择器链结 = { x.xpath(\"a/text()\")[0]:x.xpath(\"a/@href\")[0] for x in 行业数据选择器链结}#注意\"\"\n",
    "行业数据选择器链结"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 分析行业参数的关键参数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "<class 'pandas.core.frame.DataFrame'>\n",
      "RangeIndex: 51 entries, 0 to 50\n",
      "Data columns (total 6 columns):\n",
      " #   Column    Non-Null Count  Dtype \n",
      "---  ------    --------------  ----- \n",
      " 0   scheme    51 non-null     object\n",
      " 1   netloc    51 non-null     object\n",
      " 2   path      51 non-null     object\n",
      " 3   params    51 non-null     object\n",
      " 4   query     51 non-null     object\n",
      " 5   fragment  51 non-null     object\n",
      "dtypes: object(6)\n",
      "memory usage: 2.5+ KB\n",
      "scheme       1\n",
      "netloc       1\n",
      "path         1\n",
      "params       1\n",
      "query       51\n",
      "fragment     1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>flushckid=1&amp;compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=4...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  flushckid=1&compkind=&dqs=&pubTime=&pageSize=4...           "
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# urlparsee返回的6个部分，分别是：scheme(机制)丶netloc(网络位置)丶path(路径)丶params(路径段参数)丶query(查询)丶fragment(片段)。\n",
    "df = pd.DataFrame([ urlparse(x) for x in 行业数据选择器链结.values()])\n",
    "df.info()\n",
    "print(df.nunique())\n",
    "df.head(1)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "flushckid        1\n",
      "pageSize         1\n",
      "industryType    12\n",
      "industries      51\n",
      "key              1\n",
      "siTag            1\n",
      "d_sfrom          1\n",
      "d_ckId           1\n",
      "d_curPage        1\n",
      "d_pageSize       1\n",
      "d_headId         1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>flushckid</th>\n",
       "      <th>pageSize</th>\n",
       "      <th>industryType</th>\n",
       "      <th>industries</th>\n",
       "      <th>key</th>\n",
       "      <th>siTag</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_headId</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>40</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>040</td>\n",
       "      <td>PRD</td>\n",
       "      <td>5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>40</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>420</td>\n",
       "      <td>PRD</td>\n",
       "      <td>5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>1</td>\n",
       "      <td>40</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>010</td>\n",
       "      <td>PRD</td>\n",
       "      <td>5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>1</td>\n",
       "      <td>40</td>\n",
       "      <td>industry_01</td>\n",
       "      <td>030</td>\n",
       "      <td>PRD</td>\n",
       "      <td>5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>1</td>\n",
       "      <td>40</td>\n",
       "      <td>industry_02</td>\n",
       "      <td>050</td>\n",
       "      <td>PRD</td>\n",
       "      <td>5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>6c380aff9cf115badbb09e8f85eac07c</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  flushckid pageSize industryType industries  key  \\\n",
       "0         1       40  industry_01        040  PRD   \n",
       "1         1       40  industry_01        420  PRD   \n",
       "2         1       40  industry_01        010  PRD   \n",
       "3         1       40  industry_01        030  PRD   \n",
       "4         1       40  industry_02        050  PRD   \n",
       "\n",
       "                                           siTag         d_sfrom  \\\n",
       "0  5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw  search_unknown   \n",
       "1  5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw  search_unknown   \n",
       "2  5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw  search_unknown   \n",
       "3  5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw  search_unknown   \n",
       "4  5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw  search_unknown   \n",
       "\n",
       "                             d_ckId d_curPage d_pageSize  \\\n",
       "0  6c380aff9cf115badbb09e8f85eac07c         0         40   \n",
       "1  6c380aff9cf115badbb09e8f85eac07c         0         40   \n",
       "2  6c380aff9cf115badbb09e8f85eac07c         0         40   \n",
       "3  6c380aff9cf115badbb09e8f85eac07c         0         40   \n",
       "4  6c380aff9cf115badbb09e8f85eac07c         0         40   \n",
       "\n",
       "                           d_headId  \n",
       "0  6c380aff9cf115badbb09e8f85eac07c  \n",
       "1  6c380aff9cf115badbb09e8f85eac07c  \n",
       "2  6c380aff9cf115badbb09e8f85eac07c  \n",
       "3  6c380aff9cf115badbb09e8f85eac07c  \n",
       "4  6c380aff9cf115badbb09e8f85eac07c  "
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 针对query 再解析\n",
    "# df_qs = pd.DataFrame([ parse_qs(x) for x in df['query'] ])\n",
    "# parse_qs返回query(查询)多个部分\n",
    "\n",
    "df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(x).items()} for x in df['query'] ])\n",
    "print (df_qs.nunique())\n",
    "df_qs.head()\n"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "* 找寻到关键参数--industryType、industries   "
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 建构行业参数模板"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['040'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c']}\n",
      "{'互联网/电商': '040', '游戏产业': '420', '计算机软件': '010', 'IT服务': '030', '电子/芯片/半导体': '050', '通信业': '060', '计算机/网络设备': '020', '房地产/建筑': '080', '规划/设计/装潢': '100', '房地产服务': '090', '银行': '130', '保险': '140', '基金/证券/投资': '150', '会计/审计': '430', '信托/担保/拍卖': '500', '快消品': '190', '批发零售': '240', '服装纺织': '200', '家具/家电': '210', '办公设备': '220', '奢侈品/收藏品': '460', '珠宝/玩具/工艺品': '470', '汽车/摩托车': '350', '机械/机电/重工': '360', '印刷/包装/造纸': '180', '原材料加工': '370', '仪器/电气/自动化': '340', '制药/生物工程': '270', '医疗/保健/美容': '280', '医疗器械': '290', '能源/水利': '330', '石油/化工': '310', '采掘/冶炼/矿产': '320', '环保': '300', '新能源': '490', '专业服务': '120', '中介服务': '110', '外包服务': '440', '检测/认证': '450', '餐饮/酒旅/服务': '230', '文体娱乐': '260', '租赁服务': '510', '广告/市场/会展': '070', '影视文化': '170', '教育培训': '380', '交通/物流/运输': '250', '贸易/进出口': '160', '航空/航天': '480', '政务/公共服务': '390', '农林牧渔': '410', '其他行业': '400'}\n"
     ]
    }
   ],
   "source": [
    "def parse_url_qs_for_industries(url):\n",
    "    \"\"\"Return the query-string parameters of ``url`` as a dict.\n",
    "\n",
    "    The URL is split with ``urlparse`` and its query component is decoded with\n",
    "    ``parse_qs``, so every key maps to a list of string values.\n",
    "    \"\"\"\n",
    "    return parse_qs(urlparse(url).query)\n",
    "\n",
    "# The first industry link serves as the template: its parsed query supplies the\n",
    "# parameters that are reused for every request built later.\n",
    "参数模板 = parse_url_qs_for_industries(next(iter(行业数据选择器链结.values())))\n",
    "print(参数模板)\n",
    "\n",
    "# Industry name -> `industries` code (parse_qs yields a list, so take its first item).\n",
    "字典_industries = {k: parse_url_qs_for_industries(v)['industries'][0] for k, v in 行业数据选择器链结.items()}\n",
    "print (字典_industries)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'互联网/电商': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['040'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '游戏产业': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['420'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '计算机软件': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['010'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, 'IT服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['030'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '电子/芯片/半导体': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['050'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '通信业': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['060'], 'key': 
['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '计算机/网络设备': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['020'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '房地产/建筑': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['080'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '规划/设计/装潢': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['100'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '房地产服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['090'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '银行': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['130'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': 
['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '保险': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['140'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '基金/证券/投资': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['150'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '会计/审计': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['430'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '信托/担保/拍卖': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['500'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '快消品': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['190'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': 
['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '批发零售': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['240'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '服装纺织': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['200'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '家具/家电': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['210'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '办公设备': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['220'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '奢侈品/收藏品': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['460'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '珠宝/玩具/工艺品': {'flushckid': ['1'], 'pageSize': ['40'], 
'industryType': ['industry_01'], 'industries': ['470'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '汽车/摩托车': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['350'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '机械/机电/重工': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['360'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '印刷/包装/造纸': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['180'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '原材料加工': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['370'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '仪器/电气/自动化': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['340'], 'key': ['PRD'], 'siTag': 
['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '制药/生物工程': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['270'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '医疗/保健/美容': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['280'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '医疗器械': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['290'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '能源/水利': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['330'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '石油/化工': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['310'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': 
['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '采掘/冶炼/矿产': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['320'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '环保': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['300'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '新能源': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['490'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '专业服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['120'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '中介服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['110'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': 
['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '外包服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['440'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '检测/认证': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['450'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '餐饮/酒旅/服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['230'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '文体娱乐': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['260'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '租赁服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['510'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '广告/市场/会展': {'flushckid': ['1'], 'pageSize': ['40'], 
'industryType': ['industry_01'], 'industries': ['070'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '影视文化': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['170'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '教育培训': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['380'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '交通/物流/运输': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['250'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '贸易/进出口': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['160'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '航空/航天': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['480'], 'key': ['PRD'], 'siTag': 
['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '政务/公共服务': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['390'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '农林牧渔': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['410'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}, '其他行业': {'flushckid': ['1'], 'pageSize': ['40'], 'industryType': ['industry_01'], 'industries': ['400'], 'key': ['PRD'], 'siTag': ['5pAulR6ffRIsqTOD3tZ_8w~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['6c380aff9cf115badbb09e8f85eac07c'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['6c380aff9cf115badbb09e8f85eac07c'], 'keyword': ['产品经理']}}\n"
     ]
    }
   ],
   "source": [
    "def 参数模板生成(industries, keyword):\n",
    "    \"\"\"Build one request-parameter dict from the module-level template ``参数模板``.\n",
    "\n",
    "    Args:\n",
    "        industries: value stored under ``'industries'`` (callers pass a one-item\n",
    "            list such as ``['040']``).\n",
    "        keyword: value stored under ``'keyword'`` (e.g. ``['产品经理']``).\n",
    "\n",
    "    Returns:\n",
    "        A new dict; ``参数模板`` itself is left unmodified.\n",
    "    \"\"\"\n",
    "    # dict.copy() is shallow, which would leave every generated dict sharing the\n",
    "    # template's value lists; copy each list so the results are independent.\n",
    "    参数 = {name: list(values) for name, values in 参数模板.items()}\n",
    "    参数['industries'] = industries\n",
    "    参数['keyword'] = keyword\n",
    "    return 参数\n",
    "\n",
    "# One parameter dict per industry, each searching for the keyword '产品经理'.\n",
    "参数_industries_产品经理 = {\n",
    "    industry_name: 参数模板生成(industries=[industry_code], keyword=['产品经理'])\n",
    "    for industry_name, industry_code in 字典_industries.items()\n",
    "}\n",
    "print(参数_industries_产品经理)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 翻页参数"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [],
   "source": [
    "# A-0   Single page: request the search results for the keyword PRD.\n",
    "url = \"https://www.liepin.com/zhaopin/?keyword=PRD\"\n",
    "session = HTMLSession()\n",
    "# Without a timeout the call can block indefinitely if the server never answers.\n",
    "r = session.get(url, timeout=10)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "[<Element 'a' href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=1'>, <Element 'a' href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=2'>, <Element 'a' href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=3'>, <Element 'a' href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=4'>, <Element 'a' href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=1'>, <Element 'a' class=('last',) 
href='/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=9' title='末页'>]\n",
      "{'2': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=1', '3': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=2', '4': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=3', '5': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=4', '下一页': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=1', '': 
'/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=PRD&siTag=5pAulR6ffRIsqTOD3tZ_8w%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=7c661900e11d453dcc2739a7644ff944&d_curPage=0&d_pageSize=40&d_headId=7c661900e11d453dcc2739a7644ff944&curPage=9'}\n"
     ]
    }
   ],
   "source": [
    "# A-1  Parse the pager links (a/@href) with xpath.\n",
    "# A plain '//div[@class=\"pagerbar\"]/a' would also match the disabled/current\n",
    "# entries, whose href is javascript, so keep only hrefs that start with /zhaopin.\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "翻页a_列表 = r.html.xpath(xpath_翻页a)  # run the query once and reuse the elements\n",
    "print (翻页a_列表) # Element objects\n",
    "\n",
    "# The xpath filter guarantees every matched <a> carries an href attribute.\n",
    "href_列表 = [x.attrs['href'] for x in 翻页a_列表]\n",
    "\n",
    "文字_列表 = [x.text for x in 翻页a_列表]\n",
    "\n",
    "# Link text -> href; links that share the same text keep only the last href.\n",
    "href_字典 = dict(zip(文字_列表, href_列表))\n",
    "print (href_字典)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 分析翻页链接，找到关键参数及参数结构"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>scheme</th>\n",
       "      <th>netloc</th>\n",
       "      <th>path</th>\n",
       "      <th>params</th>\n",
       "      <th>query</th>\n",
       "      <th>fragment</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td></td>\n",
       "      <td></td>\n",
       "      <td>/zhaopin/</td>\n",
       "      <td></td>\n",
       "      <td>compkind=&amp;dqs=&amp;pubTime=&amp;pageSize=40&amp;salary=&amp;co...</td>\n",
       "      <td></td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  scheme netloc       path params  \\\n",
       "0                /zhaopin/          \n",
       "1                /zhaopin/          \n",
       "2                /zhaopin/          \n",
       "3                /zhaopin/          \n",
       "4                /zhaopin/          \n",
       "5                /zhaopin/          \n",
       "\n",
       "                                               query fragment  \n",
       "0  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           \n",
       "1  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           \n",
       "2  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           \n",
       "3  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           \n",
       "4  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           \n",
       "5  compkind=&dqs=&pubTime=&pageSize=40&salary=&co...           "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "scheme      1\n",
      "netloc      1\n",
      "path        1\n",
      "params      1\n",
      "query       5\n",
      "fragment    1\n",
      "dtype: int64\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>pageSize</th>\n",
       "      <th>sortFlag</th>\n",
       "      <th>siTag</th>\n",
       "      <th>d_sfrom</th>\n",
       "      <th>d_ckId</th>\n",
       "      <th>d_curPage</th>\n",
       "      <th>d_pageSize</th>\n",
       "      <th>d_headId</th>\n",
       "      <th>curPage</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>40</td>\n",
       "      <td>°radeFlag=0</td>\n",
       "      <td>1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw</td>\n",
       "      <td>search_unknown</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>0</td>\n",
       "      <td>40</td>\n",
       "      <td>f687b5e8f73707274eb9452147370d58</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "  pageSize     sortFlag                                          siTag  \\\n",
       "0       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "1       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "2       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "3       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "4       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "5       40  °radeFlag=0  1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw   \n",
       "\n",
       "          d_sfrom                            d_ckId d_curPage d_pageSize  \\\n",
       "0  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "1  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "2  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "3  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "4  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "5  search_unknown  f687b5e8f73707274eb9452147370d58         0         40   \n",
       "\n",
       "                           d_headId curPage  \n",
       "0  f687b5e8f73707274eb9452147370d58       1  \n",
       "1  f687b5e8f73707274eb9452147370d58       2  \n",
       "2  f687b5e8f73707274eb9452147370d58       3  \n",
       "3  f687b5e8f73707274eb9452147370d58       4  \n",
       "4  f687b5e8f73707274eb9452147370d58       1  \n",
       "5  f687b5e8f73707274eb9452147370d58       9  "
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "pageSize      1\n",
      "sortFlag      1\n",
      "siTag         1\n",
      "d_sfrom       1\n",
      "d_ckId        1\n",
      "d_curPage     1\n",
      "d_pageSize    1\n",
      "d_headId      1\n",
      "curPage       5\n",
      "dtype: int64\n"
     ]
    }
   ],
   "source": [
    "# Modules this cell relies on\n",
    "from urllib.parse import urlparse, parse_qs\n",
    "import pandas as pd\n",
    "from IPython.display import display, HTML\n",
    "\n",
    "# Input: href_列表 (the pager links); the query string of each link becomes one row of parameters\n",
    "\n",
    "# Split every link into its URL components, one row per link\n",
    "df = pd.DataFrame(list(map(urlparse, href_列表)))\n",
    "# Keep only the first value of each query parameter\n",
    "df_qs = pd.DataFrame([\n",
    "    {name: values[0] for name, values in parsed.items()}\n",
    "    for parsed in df['query'].map(parse_qs)\n",
    "])\n",
    "\n",
    "# Each table is shown together with its number of distinct values per column\n",
    "display(df)\n",
    "print(df.nunique())\n",
    "display(df_qs)\n",
    "print(df_qs.nunique())\n",
    "\n",
    "# Add the page number as an integer column\n",
    "df_qs = df_qs.assign(curPage_int=lambda frame: frame.curPage.astype(int))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 建构翻页参数模板"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "{'pageSize': ['40'], 'sortFlag': ['°radeFlag=0'], 'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'], 'd_sfrom': ['search_unknown'], 'd_ckId': ['f687b5e8f73707274eb9452147370d58'], 'd_curPage': ['0'], 'd_pageSize': ['40'], 'd_headId': ['f687b5e8f73707274eb9452147370d58'], 'curPage': ['1']}\n",
      "{'2': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=1', '3': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=2', '4': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=3', '5': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=4', '下一页': '/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=1', '': 
'/zhaopin/?compkind=&dqs=&pubTime=&pageSize=40&salary=&compTag=&sortFlag=°radeFlag=0&compIds=&subIndustry=&jobKind=&industries=&compscale=&key=&siTag=1B2M2Y8AsgTpgAmY7PhCfg%7EfA9rXquZc5IkJpXC-Ycixw&d_sfrom=search_unknown&d_ckId=f687b5e8f73707274eb9452147370d58&d_curPage=0&d_pageSize=40&d_headId=f687b5e8f73707274eb9452147370d58&curPage=9'}\n"
     ]
    }
   ],
   "source": [
    "# 建构参数模板：找到关键参数及参数结构\n",
    "\n",
    "def parse_url_qs_for_curPage (url):\n",
    "    six_parts = urlparse(url) \n",
    "    out = parse_qs(six_parts.query)\n",
    "    return (out)\n",
    "\n",
    "# Use the first pager link as the parameter template\n",
    "参数模板 = parse_url_qs_for_curPage(href_列表[0])\n",
    "\n",
    "# Show the template, then the label -> link mapping it was taken from\n",
    "print(参数模板, href_字典, sep=\"\\n\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "9\n"
     ]
    },
    {
     "data": {
      "text/plain": [
       "{0: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [0],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 1: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [1],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 2: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [2],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 3: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [3],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 4: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [4],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 5: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [5],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 6: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [6],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 7: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [7],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 8: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [8],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']},\n",
       " 9: {'pageSize': ['40'],\n",
       "  'sortFlag': ['°radeFlag=0'],\n",
       "  'siTag': ['1B2M2Y8AsgTpgAmY7PhCfg~fA9rXquZc5IkJpXC-Ycixw'],\n",
       "  'd_sfrom': ['search_unknown'],\n",
       "  'd_ckId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'd_curPage': ['0'],\n",
       "  'd_pageSize': ['40'],\n",
       "  'd_headId': ['f687b5e8f73707274eb9452147370d58'],\n",
       "  'curPage': [9],\n",
       "  'industryType': ['industry_01'],\n",
       "  'industries': ['040'],\n",
       "  'key': ['用户研究']}}"
      ]
     },
     "execution_count": 26,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 构建参数模板\n",
    "def 参数模板生成(industryType,industries,curPage,key):\n",
    "    参数 = 参数模板.copy()\n",
    "    参数['industryType'] = industryType\n",
    "    参数['industries'] = industries\n",
    "    参数['curPage'] = curPage\n",
    "    参数['key'] = key\n",
    "    return (参数)\n",
    "\n",
    "print(df_qs.curPage_int.min())  # smallest page number among the pager links: 1\n",
    "print(df_qs.curPage_int.max())  # largest page number among the pager links: 9\n",
    "\n",
    "# The pages to request therefore run from 0 (the current page) up to that maximum\n",
    "\n",
    "参数_key_X_curPage = dict(\n",
    "    (page, 参数模板生成(industryType=['industry_01'],\n",
    "                      industries=['040'],\n",
    "                      curPage=[page],\n",
    "                      key=['用户研究']))\n",
    "    for page in range(0, df_qs.curPage_int.max() + 1)\n",
    ")\n",
    "参数_key_X_curPage"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取的数据模板建构"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [],
   "source": [
    "session = HTMLSession()\n",
    "\n",
    "def requests_liepin( url, params):\n",
    "    \"\"\"Request one liepin search page and return its job postings as a DataFrame.\n",
    "\n",
    "    Args:\n",
    "        url: Address of the search page.\n",
    "        params: Query parameters sent with the GET request.\n",
    "\n",
    "    Returns:\n",
    "        pandas.DataFrame with one row per <li> of the `sojob-list` result list and\n",
    "        the columns 学历, 经验, 薪水, 时间, 职称, 公司地点, 公司名称, 链接, 公司URL.\n",
    "    \"\"\"\n",
    "    # Fix: send the caller's `params`. The request used to read a module-level\n",
    "    # `payload`, so this argument was silently ignored.\n",
    "    r = session.get( url , params = params)\n",
    "\n",
    "    # Every <li> of the result list is one posting; the xpaths below are evaluated per posting\n",
    "    主要元素 = r.html.xpath( '//ul[@class=\"sojob-list\"]/li')\n",
    "\n",
    "    # Column name -> xpath, grouped by the way the value is extracted\n",
    "    dict_xpaths={ \n",
    "        'text': {\n",
    "            '学历':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]',\n",
    "            '经验':      '//div[contains(@class,\"job-info\")]/p/span[@class=\"edu\"]/following-sibling::span',\n",
    "            '薪水':    '//div[contains(@class,\"job-info\")]/p/span[@class=\"text-warning\"]', \n",
    "            '时间':    '//div[contains(@class,\"job-info\")]/p/time/@title', \n",
    "            '职称':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司地点': '//div[contains(@class,\"job-info\")]/p/a',\n",
    "            '公司名称': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        },\n",
    "        'text_content': {\n",
    "        },\n",
    "        'href': {\n",
    "            '链接':    '//div[contains(@class,\"job-info\")]/h3/a', \n",
    "            '公司URL': '//div[contains(@class,\"sojob-item-main\")]//p[@class=\"company-name\"]/a', \n",
    "        }\n",
    "    }\n",
    "\n",
    "    def get_e_text_content(_xpath_):\n",
    "        \"\"\"Full text content of the first match in each posting, \"\" when nothing matches.\"\"\"\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            matches = e.xpath(_xpath_)\n",
    "            暂存结果.append(matches[0].lxml.text_content() if matches else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    def get_e_text(_xpath_):\n",
    "        \"\"\"Stripped text of all matches in each posting, joined into one string.\n",
    "\n",
    "        Attribute xpaths (such as `@title`) yield plain strings; element xpaths\n",
    "        yield elements whose `.text` is used.\n",
    "        \"\"\"\n",
    "        return [\"\".join(x.strip() if isinstance(x, str) else x.text.strip()\n",
    "                        for x in e.xpath(_xpath_))\n",
    "                for e in 主要元素]\n",
    "\n",
    "    def get_e_href(_xpath_):\n",
    "        \"\"\"One absolute link of the first match in each posting, \"\" when there is none.\"\"\"\n",
    "        暂存结果 = []\n",
    "        for e in 主要元素:\n",
    "            # Evaluate the xpath once; with first=True the result is None when nothing matches\n",
    "            matched = e.xpath(_xpath_, first=True)\n",
    "            links = list(matched.absolute_links) if matched is not None else []\n",
    "            暂存结果.append(links[0] if links else \"\")\n",
    "        return 暂存结果\n",
    "\n",
    "    # Column order follows the original layout: text_content, then text, then href\n",
    "    数据字典 = {}\n",
    "    for 类别, 取值 in (('text_content', get_e_text_content),\n",
    "                     ('text', get_e_text),\n",
    "                     ('href', get_e_href)):\n",
    "        for k, v in dict_xpaths[类别].items():\n",
    "            数据字典[k] = 取值(v)\n",
    "\n",
    "    return pd.DataFrame(数据字典)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 数据表输出-变量：行业，翻页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "用户研究 10\n",
      "UI设计 10\n",
      "产品经理 10\n",
      "新媒体运营 10\n",
      "前端开发 10\n",
      "Wall time: 4min 42s\n"
     ]
    }
   ],
   "source": [
    "%%time\n",
    "# Crawl every result page for several keywords\n",
    "import time\n",
    "from random import random\n",
    "\n",
    "url = \"https://www.liepin.com/zhaopin/\"\n",
    "xpath_翻页a = '//div[@class=\"pagerbar\"]/a[starts-with(@href,\"/zhaopin\")]'\n",
    "\n",
    "keywords = ['用户研究','UI设计','产品经理','新媒体运营','前端开发']\n",
    "list_df = list()\n",
    "\n",
    "# Industry type 互联网·游戏·软件 is industry_01, industry 互联网/电商 is 040.\n",
    "# Fix: the page requests used industry_02 / 060 although the rows are labelled\n",
    "# 互联网/电商 below; the same codes are now used for the probe and for every page.\n",
    "INDUSTRY_TYPE = ['industry_01']\n",
    "INDUSTRIES = ['040']\n",
    "\n",
    "for key in keywords:\n",
    "    # Probe the first page of this keyword to find out how many pages it has.\n",
    "    payload = 参数模板生成(industryType=INDUSTRY_TYPE, industries=INDUSTRIES, key=[key], curPage=['0'])\n",
    "    # Fix: read the pager from the response of this very request instead of a\n",
    "    # leftover `r` from an earlier cell.\n",
    "    r = session.get(url, params=payload)\n",
    "    href_列表 = [x.xpath('//@href')[0] for x in r.html.xpath(xpath_翻页a)]\n",
    "    df_qs = pd.DataFrame([{k:v[0] for k,v in parse_qs(urlparse(x).query).items()} for x in href_列表])\n",
    "    if 'curPage' in df_qs:\n",
    "        df_qs = df_qs.assign(curPage_int=df_qs.curPage.astype(int))  # page number as integer\n",
    "        长度 = int(df_qs.curPage_int.max()) + 1\n",
    "    else:\n",
    "        # No pager links: the keyword has a single result page\n",
    "        长度 = 1\n",
    "    参数_keyword_X_curPage = {\n",
    "        i: 参数模板生成(industryType=INDUSTRY_TYPE,\n",
    "                     industries=INDUSTRIES,\n",
    "                     curPage=[i],\n",
    "                     key=[key])\n",
    "        for i in range(0, 长度)\n",
    "    }\n",
    "    print (key,长度)#10\n",
    "\n",
    "    for k,v in 参数_keyword_X_curPage.items():\n",
    "        # `payload` is rebound for every page so the request always carries this page's parameters\n",
    "        payload = v\n",
    "        df = requests_liepin( url, params = payload)\n",
    "        time.sleep(3+4*random())  # slow down: 3-7 seconds, about 5 on average\n",
    "        # Tag every row with the search it came from\n",
    "        df = df.assign(行业类型 = '互联网·游戏·软件',\n",
    "                       行业 = '互联网/电商',\n",
    "                       关键词 = key,  # keyword\n",
    "                       页数 = k)      # curPage\n",
    "        list_df.append(df)\n",
    "\n",
    "df_all = pd.concat(list_df).reset_index()\n",
    "df_all.index.name = '序'\n",
    "\n",
    "# Export\n",
    "df_all.to_excel(\"20春_Web数据挖掘_liepin_互联网_电商行业_翻页合集.xlsx\",\n",
    "                sheet_name=\"_\".join(keywords))\n",
    "# Estimated time: 5 keywords * ~5 s * 10 pages = 250 s\n",
    "# Estimated rows: 5 keywords * 40 per page * 10 pages = 2000 at most"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>时间</th>\n",
       "      <th>职称</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司URL</th>\n",
       "      <th>行业类型</th>\n",
       "      <th>行业</th>\n",
       "      <th>关键词</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>序</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-40k·12薪</td>\n",
       "      <td>2020年07月17日</td>\n",
       "      <td>用户体验研究专家</td>\n",
       "      <td>深圳-龙岗区</td>\n",
       "      <td>兴硕信息科技(上海)有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1928830743.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9408666/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>用户研究</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>2020年07月16日</td>\n",
       "      <td>高级用户体验研究员（用户研究岗）</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>https://www.liepin.com/job/1927446107.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9122701/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>用户研究</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>2020年07月16日</td>\n",
       "      <td>高级用户体验研究员</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>https://www.liepin.com/job/1927446101.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9122701/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>用户研究</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-35k·12薪</td>\n",
       "      <td>2020年07月16日</td>\n",
       "      <td>用户体验高级研究员</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>https://www.liepin.com/job/1920864427.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9122701/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>用户研究</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>2020年07月16日</td>\n",
       "      <td>用户市场高级研究员</td>\n",
       "      <td>北京-广安门</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>https://www.liepin.com/job/1920864247.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9122701/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>用户研究</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1734</th>\n",
       "      <td>35</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>2020年01月06日</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>长沙-东屯渡</td>\n",
       "      <td>中兴网信</td>\n",
       "      <td>https://www.liepin.com/job/1915700912.shtml</td>\n",
       "      <td>https://www.liepin.com/company/866312/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1735</th>\n",
       "      <td>36</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>2019年12月27日</td>\n",
       "      <td>web前端开发工程师(004004)</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>vivo</td>\n",
       "      <td>https://www.liepin.com/job/1919989465.shtml</td>\n",
       "      <td>https://www.liepin.com/company/4787049/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1736</th>\n",
       "      <td>37</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>2019年12月27日</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>上海</td>\n",
       "      <td>上海铱芯信息科技有限公司</td>\n",
       "      <td>https://www.liepin.com/job/1915468791.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9549866/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1737</th>\n",
       "      <td>38</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·16薪</td>\n",
       "      <td>2019年12月26日</td>\n",
       "      <td>WEB前端开发工程师</td>\n",
       "      <td>成都</td>\n",
       "      <td>华为技术有限公司成都研究所</td>\n",
       "      <td>https://www.liepin.com/job/1925518261.shtml</td>\n",
       "      <td>https://www.liepin.com/company/9518877/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1738</th>\n",
       "      <td>39</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>2019年12月24日</td>\n",
       "      <td>WEB 前端开发工程师</td>\n",
       "      <td>深圳</td>\n",
       "      <td>华为</td>\n",
       "      <td>https://www.liepin.com/job/1925485149.shtml</td>\n",
       "      <td>https://www.liepin.com/company/954482/</td>\n",
       "      <td>互联网·游戏·软件</td>\n",
       "      <td>互联网/电商</td>\n",
       "      <td>前端开发</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1739 rows × 14 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "      index     学历     经验          薪水           时间                  职称  \\\n",
       "序                                                                        \n",
       "0         0   统招本科   3-5年  25-40k·12薪  2020年07月17日            用户体验研究专家   \n",
       "1         1  硕士及以上  5-10年  16-32k·13薪  2020年07月16日    高级用户体验研究员（用户研究岗）   \n",
       "2         2  硕士及以上  5-10年  16-32k·13薪  2020年07月16日           高级用户体验研究员   \n",
       "3         3  硕士及以上  5-10年  20-35k·12薪  2020年07月16日           用户体验高级研究员   \n",
       "4         4  硕士及以上  5-10年  16-32k·13薪  2020年07月16日           用户市场高级研究员   \n",
       "...     ...    ...    ...         ...          ...                 ...   \n",
       "1734     35   统招本科   1-3年  10-18k·12薪  2020年01月06日             前端开发工程师   \n",
       "1735     36   统招本科   3-5年          面议  2019年12月27日  web前端开发工程师(004004)   \n",
       "1736     37   统招本科   1-3年  10-15k·12薪  2019年12月27日             前端开发工程师   \n",
       "1737     38  本科及以上   3-5年  15-30k·16薪  2019年12月26日          WEB前端开发工程师   \n",
       "1738     39   统招本科   1-3年  15-30k·12薪  2019年12月24日         WEB 前端开发工程师   \n",
       "\n",
       "        公司地点            公司名称                                           链接  \\\n",
       "序                                                                           \n",
       "0     深圳-龙岗区  兴硕信息科技(上海)有限公司  https://www.liepin.com/job/1928830743.shtml   \n",
       "1         北京   中国移动通信有限公司研究院  https://www.liepin.com/job/1927446107.shtml   \n",
       "2         北京   中国移动通信有限公司研究院  https://www.liepin.com/job/1927446101.shtml   \n",
       "3         北京   中国移动通信有限公司研究院  https://www.liepin.com/job/1920864427.shtml   \n",
       "4     北京-广安门   中国移动通信有限公司研究院  https://www.liepin.com/job/1920864247.shtml   \n",
       "...      ...             ...                                          ...   \n",
       "1734  长沙-东屯渡            中兴网信  https://www.liepin.com/job/1915700912.shtml   \n",
       "1735  深圳-福田区            vivo  https://www.liepin.com/job/1919989465.shtml   \n",
       "1736      上海    上海铱芯信息科技有限公司  https://www.liepin.com/job/1915468791.shtml   \n",
       "1737      成都   华为技术有限公司成都研究所  https://www.liepin.com/job/1925518261.shtml   \n",
       "1738      深圳              华为  https://www.liepin.com/job/1925485149.shtml   \n",
       "\n",
       "                                        公司URL       行业类型      行业   关键词  页数  \n",
       "序                                                                           \n",
       "0     https://www.liepin.com/company/9408666/  互联网·游戏·软件  互联网/电商  用户研究   0  \n",
       "1     https://www.liepin.com/company/9122701/  互联网·游戏·软件  互联网/电商  用户研究   0  \n",
       "2     https://www.liepin.com/company/9122701/  互联网·游戏·软件  互联网/电商  用户研究   0  \n",
       "3     https://www.liepin.com/company/9122701/  互联网·游戏·软件  互联网/电商  用户研究   0  \n",
       "4     https://www.liepin.com/company/9122701/  互联网·游戏·软件  互联网/电商  用户研究   0  \n",
       "...                                       ...        ...     ...   ...  ..  \n",
       "1734   https://www.liepin.com/company/866312/  互联网·游戏·软件  互联网/电商  前端开发   9  \n",
       "1735  https://www.liepin.com/company/4787049/  互联网·游戏·软件  互联网/电商  前端开发   9  \n",
       "1736  https://www.liepin.com/company/9549866/  互联网·游戏·软件  互联网/电商  前端开发   9  \n",
       "1737  https://www.liepin.com/company/9518877/  互联网·游戏·软件  互联网/电商  前端开发   9  \n",
       "1738   https://www.liepin.com/company/954482/  互联网·游戏·软件  互联网/电商  前端开发   9  \n",
       "\n",
       "[1739 rows x 14 columns]"
      ]
     },
     "execution_count": 34,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Show the combined table built from all keywords and pages\n",
    "df_all"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "## 数据整理\n",
    "* 代码笔记\n",
    "* [set_index()](https://blog.csdn.net/cuit2016123070/article/details/83624074):\n",
    "  * 可以设置单索引和复合索引\n",
    "  * 函数原型：DataFrame.set_index(keys, drop=True, append=False, inplace=False, verify_integrity=False) \n",
    "  * keys：列标签或列标签/数组列表，需要设置为索引的列\n",
    "  * drop：默认为True，删除用作新索引的列\n",
    "  * append：默认为False，是否将列附加到现有索引\n",
    "  * inplace：默认为False，适当修改DataFrame(不要创建新对象)\n",
    "  * verify_integrity：默认为false，检查新索引的副本。否则，请将检查推迟到必要时进行。将其设置为false将提高该方法的性能\n",
    "* [reset_index()](https://blog.csdn.net/cuit2016123070/article/details/83624074):\n",
    "  * 可以还原索引，重新变为默认的整型索引\n",
    "  * 函数原型：DataFrame.reset_index(level=None, drop=False, inplace=False, col_level=0, col_fill='')\n",
    "  * level：int、str、tuple或list，默认无，仅从索引中删除给定级别。默认情况下移除所有级别。控制了具体要还原的那个等级的索引 \n",
    "  * drop：drop为False则索引列会被还原为普通列，否则会丢失\n",
    "  * inplace：默认为false，适当修改DataFrame(不要创建新对象)\n",
    "  * col_level：int或str，默认值为0，如果列有多个级别，则确定将标签插入到哪个级别。默认情况下，它将插入到第一级。\n",
    "  * col_fill：对象，默认‘’，如果列有多个级别，则确定其他级别的命名方式。如果没有，则重复索引名\n",
    "* [loc()](https://pandas.pydata.org/pandas-docs/stable/reference/api/pandas.DataFrame.loc.html):\n",
    "  * loc函数主要通过行标签索引行数据\n",
    "  * loc中的数据是列名，是字符串，所以前后都要取"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选出用户研究的数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>关键词</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>用户体验研究专家</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-40k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928830743.shtml</td>\n",
       "      <td>深圳-龙岗区</td>\n",
       "      <td>兴硕信息科技(上海)有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>高级用户体验研究员（用户研究岗）</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1927446107.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>高级用户体验研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1927446101.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>用户体验高级研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-35k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1920864427.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>用户市场高级研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1920864247.shtml</td>\n",
       "      <td>北京-广安门</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>售前经理（云平台）</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1921515331.shtml</td>\n",
       "      <td>武汉</td>\n",
       "      <td>武汉电信实业有限责任公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>广东智慧广电物联网科技有限公司UI交互设计岗</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1922504205.shtml</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>广东省广播电视网络股份有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>物联网公司UI交互设计岗</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1922504203.shtml</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>广东省广播电视网络股份有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>终端产品规划与定制策略</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1916672249.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>天翼电信终端有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>用户研究</th>\n",
       "      <td>数据挖掘</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-16k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1921626551.shtml</td>\n",
       "      <td>上海-漕河泾</td>\n",
       "      <td>亚信科技</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                          职称     学历     经验          薪水  \\\n",
       "关键词                                                      \n",
       "用户研究                用户体验研究专家   统招本科   3-5年  25-40k·12薪   \n",
       "用户研究        高级用户体验研究员（用户研究岗）  硕士及以上  5-10年  16-32k·13薪   \n",
       "用户研究               高级用户体验研究员  硕士及以上  5-10年  16-32k·13薪   \n",
       "用户研究               用户体验高级研究员  硕士及以上  5-10年  20-35k·12薪   \n",
       "用户研究               用户市场高级研究员  硕士及以上  5-10年  16-32k·13薪   \n",
       "...                      ...    ...    ...         ...   \n",
       "用户研究               售前经理（云平台）  本科及以上   1-3年   8-12k·12薪   \n",
       "用户研究  广东智慧广电物联网科技有限公司UI交互设计岗  本科及以上   1-3年  10-15k·12薪   \n",
       "用户研究            物联网公司UI交互设计岗  本科及以上   1-3年  10-15k·12薪   \n",
       "用户研究             终端产品规划与定制策略  硕士及以上   3-5年          面议   \n",
       "用户研究                    数据挖掘  本科及以上   3-5年  10-16k·12薪   \n",
       "\n",
       "                                               链接    公司地点             公司名称  页数  \n",
       "关键词                                                                             \n",
       "用户研究  https://www.liepin.com/job/1928830743.shtml  深圳-龙岗区   兴硕信息科技(上海)有限公司   0  \n",
       "用户研究  https://www.liepin.com/job/1927446107.shtml      北京    中国移动通信有限公司研究院   0  \n",
       "用户研究  https://www.liepin.com/job/1927446101.shtml      北京    中国移动通信有限公司研究院   0  \n",
       "用户研究  https://www.liepin.com/job/1920864427.shtml      北京    中国移动通信有限公司研究院   0  \n",
       "用户研究  https://www.liepin.com/job/1920864247.shtml  北京-广安门    中国移动通信有限公司研究院   0  \n",
       "...                                           ...     ...              ...  ..  \n",
       "用户研究  https://www.liepin.com/job/1921515331.shtml      武汉     武汉电信实业有限责任公司   9  \n",
       "用户研究  https://www.liepin.com/job/1922504205.shtml  广州-天河区  广东省广播电视网络股份有限公司   9  \n",
       "用户研究  https://www.liepin.com/job/1922504203.shtml  广州-天河区  广东省广播电视网络股份有限公司   9  \n",
       "用户研究  https://www.liepin.com/job/1916672249.shtml      北京       天翼电信终端有限公司   9  \n",
       "用户研究  https://www.liepin.com/job/1921626551.shtml  上海-漕河泾             亚信科技   9  \n",
       "\n",
       "[400 rows x 8 columns]"
      ]
     },
     "execution_count": 39,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_yhyj = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']].set_index(\"关键词\").loc['用户研究']\n",
    "df_yhyj.to_excel(\"用户研究.xlsx\",\\\n",
    "                sheet_name=\"互联网_电商_用户研究\")\n",
    "df_yhyj"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选出ui设计的数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>关键词</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>资深ui设计师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-40k·16薪</td>\n",
       "      <td>https://www.liepin.com/job/1930040433.shtml</td>\n",
       "      <td>上海</td>\n",
       "      <td>千云(上海)信息科技有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1927897597.shtml</td>\n",
       "      <td>镇江</td>\n",
       "      <td>中国联合网络通信有限公司江苏省分公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>初级UI设计师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1926982717.shtml</td>\n",
       "      <td>南京-建邺区</td>\n",
       "      <td>中国联合网络通信有限公司江苏省分公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>ui设计</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>6-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925162677.shtml</td>\n",
       "      <td>佛山-顺德区</td>\n",
       "      <td>广东顺德中电信息技术有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>前端界面设计</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-15k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1925495583.shtml</td>\n",
       "      <td>福州-中亭街</td>\n",
       "      <td>金钱猫科技股份有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>GUI视觉创意经理（外销）(004...</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>30-60k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929565837.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>vivo</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>Android开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>8-10k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929564671.shtml</td>\n",
       "      <td></td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>java开发</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>6-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1926869813.shtml</td>\n",
       "      <td>西安</td>\n",
       "      <td>国家无线电频谱管理研究所有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>Android系统</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>16-28k·13薪</td>\n",
       "      <td>https://www.liepin.com/a/20637785.shtml</td>\n",
       "      <td>杭州</td>\n",
       "      <td>某科技外包公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>UI设计</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>21-42k·12薪</td>\n",
       "      <td>https://www.liepin.com/a/11975363.shtml</td>\n",
       "      <td></td>\n",
       "      <td>某大型集团公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                        职称     学历    经验          薪水  \\\n",
       "关键词                                                   \n",
       "UI设计               资深ui设计师  本科及以上  3-5年  25-40k·16薪   \n",
       "UI设计                  UI设计   统招本科  经验不限          面议   \n",
       "UI设计               初级UI设计师   统招本科  1-3年          面议   \n",
       "UI设计                  ui设计   学历不限  经验不限   6-12k·12薪   \n",
       "UI设计                前端界面设计   统招本科  1-3年   8-15k·13薪   \n",
       "...                    ...    ...   ...         ...   \n",
       "UI设计  GUI视觉创意经理（外销）(004...  本科及以上  3-5年  30-60k·12薪   \n",
       "UI设计          Android开发工程师  本科及以上  3-5年   8-10k·12薪   \n",
       "UI设计                java开发  硕士及以上  3-5年   6-12k·12薪   \n",
       "UI设计             Android系统  大专及以上  经验不限  16-28k·13薪   \n",
       "UI设计                  产品经理  本科及以上  3-5年  21-42k·12薪   \n",
       "\n",
       "                                               链接    公司地点                公司名称  \\\n",
       "关键词                                                                             \n",
       "UI设计  https://www.liepin.com/job/1930040433.shtml      上海      千云(上海)信息科技有限公司   \n",
       "UI设计  https://www.liepin.com/job/1927897597.shtml      镇江  中国联合网络通信有限公司江苏省分公司   \n",
       "UI设计  https://www.liepin.com/job/1926982717.shtml  南京-建邺区  中国联合网络通信有限公司江苏省分公司   \n",
       "UI设计  https://www.liepin.com/job/1925162677.shtml  佛山-顺德区      广东顺德中电信息技术有限公司   \n",
       "UI设计  https://www.liepin.com/job/1925495583.shtml  福州-中亭街         金钱猫科技股份有限公司   \n",
       "...                                           ...     ...                 ...   \n",
       "UI设计  https://www.liepin.com/job/1929565837.shtml      深圳                vivo   \n",
       "UI设计  https://www.liepin.com/job/1929564671.shtml                  彩讯科技股份有限公司   \n",
       "UI设计  https://www.liepin.com/job/1926869813.shtml      西安    国家无线电频谱管理研究所有限公司   \n",
       "UI设计      https://www.liepin.com/a/20637785.shtml      杭州             某科技外包公司   \n",
       "UI设计      https://www.liepin.com/a/11975363.shtml                     某大型集团公司   \n",
       "\n",
       "      页数  \n",
       "关键词       \n",
       "UI设计   0  \n",
       "UI设计   0  \n",
       "UI设计   0  \n",
       "UI设计   0  \n",
       "UI设计   0  \n",
       "...   ..  \n",
       "UI设计   9  \n",
       "UI设计   9  \n",
       "UI设计   9  \n",
       "UI设计   9  \n",
       "UI设计   9  \n",
       "\n",
       "[400 rows x 8 columns]"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_ui = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']].set_index(\"关键词\").loc['UI设计']\n",
    "df_ui.to_excel(\"UI设计.xlsx\",\\\n",
    "                 sheet_name=\"互联网_电商_UI设计\")\n",
    "df_ui"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选出产品经理的数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>关键词</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>无线产品解决方案经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929524637.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>瑞斯康达科技</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>流量产品经理(003860)</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>50-80k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1930041917.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>10-14k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1930037165.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>北京创联云睿科技有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>海外产品经理(007079)(008006)</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-50k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1930035275.shtml</td>\n",
       "      <td>南京</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>应用分发产品经理（广告方向）(008005)</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-50k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1930034961.shtml</td>\n",
       "      <td>深圳-宝安区</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>产品运营经理</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>20-35k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929727969.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>内容平台产品经理(007904)</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>25-50k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929697633.shtml</td>\n",
       "      <td>北京-酒仙桥</td>\n",
       "      <td>vivo</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>产品经理（手机方向）</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929324909.shtml</td>\n",
       "      <td>深圳-南山区</td>\n",
       "      <td>INNOVATECH</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>12-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929145633.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>畅行神州</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>产品经理</th>\n",
       "      <td>产品经理（急聘）</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-50k·16薪</td>\n",
       "      <td>https://www.liepin.com/job/1929101239.shtml</td>\n",
       "      <td>南京-雨花台区</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                          职称     学历     经验          薪水  \\\n",
       "关键词                                                      \n",
       "产品经理              无线产品解决方案经理   统招本科   3-5年  10-20k·12薪   \n",
       "产品经理          流量产品经理(003860)  本科及以上  5-10年  50-80k·12薪   \n",
       "产品经理                    产品经理  本科及以上   经验不限  10-14k·12薪   \n",
       "产品经理  海外产品经理(007079)(008006)  本科及以上   3-5年  25-50k·12薪   \n",
       "产品经理  应用分发产品经理（广告方向）(008005)  本科及以上   3-5年  25-50k·12薪   \n",
       "...                      ...    ...    ...         ...   \n",
       "产品经理                  产品运营经理  硕士及以上   经验不限  20-35k·12薪   \n",
       "产品经理        内容平台产品经理(007904)  本科及以上  5-10年  25-50k·12薪   \n",
       "产品经理              产品经理（手机方向）  本科及以上   3-5年  15-25k·12薪   \n",
       "产品经理                    产品经理  本科及以上   经验不限  12-20k·12薪   \n",
       "产品经理                产品经理（急聘）   统招本科  5-10年  20-50k·16薪   \n",
       "\n",
       "                                               链接     公司地点          公司名称  页数  \n",
       "关键词                                                                           \n",
       "产品经理  https://www.liepin.com/job/1929524637.shtml       北京        瑞斯康达科技   0  \n",
       "产品经理  https://www.liepin.com/job/1930041917.shtml       深圳          vivo   0  \n",
       "产品经理  https://www.liepin.com/job/1930037165.shtml       北京  北京创联云睿科技有限公司   0  \n",
       "产品经理  https://www.liepin.com/job/1930035275.shtml       南京          vivo   0  \n",
       "产品经理  https://www.liepin.com/job/1930034961.shtml   深圳-宝安区          vivo   0  \n",
       "...                                           ...      ...           ...  ..  \n",
       "产品经理  https://www.liepin.com/job/1929727969.shtml       深圳            华为   9  \n",
       "产品经理  https://www.liepin.com/job/1929697633.shtml   北京-酒仙桥          vivo   9  \n",
       "产品经理  https://www.liepin.com/job/1929324909.shtml   深圳-南山区    INNOVATECH   9  \n",
       "产品经理  https://www.liepin.com/job/1929145633.shtml       深圳          畅行神州   9  \n",
       "产品经理  https://www.liepin.com/job/1929101239.shtml  南京-雨花台区            华为   9  \n",
       "\n",
       "[400 rows x 8 columns]"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_cp = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']].set_index(\"关键词\").loc['产品经理']\n",
    "df_cp.to_excel(\"产品经理.xlsx\",\\\n",
    "                 sheet_name=\"互联网_电商_产品经理\")\n",
    "df_cp"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选处新媒体运营的数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>关键词</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体运营经理</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1910288871.shtml</td>\n",
       "      <td>深圳-坂田</td>\n",
       "      <td>深圳鳍源科技有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体运营经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929930115.shtml</td>\n",
       "      <td></td>\n",
       "      <td>锐捷网络股份有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-14k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929881519.shtml</td>\n",
       "      <td>东莞</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体运营经理（视频方向）</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1926725231.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>华为</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体运营经理(004438)</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1921886645.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>资深文案</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1919909843.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>海翼电商</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>运营经理</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1919506389.shtml</td>\n",
       "      <td>厦门-集美区</td>\n",
       "      <td>厦门英特易信息科技股份有限公司</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>新媒体项目运营总监</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-20k·14薪</td>\n",
       "      <td>https://www.liepin.com/job/1918970661.shtml</td>\n",
       "      <td>江门</td>\n",
       "      <td>东莞市润熹数码电子有限公司</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>产品营销经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1918488415.shtml</td>\n",
       "      <td>东莞</td>\n",
       "      <td>vivo</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>新媒体运营</th>\n",
       "      <td>市场总监</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916909311.shtml</td>\n",
       "      <td>厦门</td>\n",
       "      <td>译翼通(厦门)科技有限公司</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>139 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                    职称     学历    经验          薪水  \\\n",
       "关键词                                               \n",
       "新媒体运营          新媒体运营经理  大专及以上  1-3年  10-18k·12薪   \n",
       "新媒体运营          新媒体运营经理  本科及以上  3-5年  15-20k·12薪   \n",
       "新媒体运营          新媒体运营专员  本科及以上  3-5年   7-14k·12薪   \n",
       "新媒体运营    新媒体运营经理（视频方向）   统招本科  经验不限          面议   \n",
       "新媒体运营  新媒体运营经理(004438)   学历不限  3-5年          面议   \n",
       "...                ...    ...   ...         ...   \n",
       "新媒体运营             资深文案  本科及以上  3-5年  15-20k·12薪   \n",
       "新媒体运营             运营经理  大专及以上  3-5年  10-20k·12薪   \n",
       "新媒体运营        新媒体项目运营总监   统招本科  1-3年  10-20k·14薪   \n",
       "新媒体运营           产品营销经理  本科及以上  3-5年  15-30k·12薪   \n",
       "新媒体运营             市场总监  本科及以上  1-3年   8-15k·12薪   \n",
       "\n",
       "                                                链接    公司地点             公司名称  \\\n",
       "关键词                                                                           \n",
       "新媒体运营  https://www.liepin.com/job/1910288871.shtml   深圳-坂田       深圳鳍源科技有限公司   \n",
       "新媒体运营  https://www.liepin.com/job/1929930115.shtml               锐捷网络股份有限公司   \n",
       "新媒体运营  https://www.liepin.com/job/1929881519.shtml      东莞             vivo   \n",
       "新媒体运营  https://www.liepin.com/job/1926725231.shtml      深圳               华为   \n",
       "新媒体运营  https://www.liepin.com/job/1921886645.shtml      深圳             vivo   \n",
       "...                                            ...     ...              ...   \n",
       "新媒体运营  https://www.liepin.com/job/1919909843.shtml      深圳             海翼电商   \n",
       "新媒体运营  https://www.liepin.com/job/1919506389.shtml  厦门-集美区  厦门英特易信息科技股份有限公司   \n",
       "新媒体运营  https://www.liepin.com/job/1918970661.shtml      江门    东莞市润熹数码电子有限公司   \n",
       "新媒体运营  https://www.liepin.com/job/1918488415.shtml      东莞             vivo   \n",
       "新媒体运营  https://www.liepin.com/job/1916909311.shtml      厦门    译翼通(厦门)科技有限公司   \n",
       "\n",
       "       页数  \n",
       "关键词        \n",
       "新媒体运营   0  \n",
       "新媒体运营   0  \n",
       "新媒体运营   0  \n",
       "新媒体运营   0  \n",
       "新媒体运营   0  \n",
       "...    ..  \n",
       "新媒体运营   3  \n",
       "新媒体运营   3  \n",
       "新媒体运营   3  \n",
       "新媒体运营   3  \n",
       "新媒体运营   3  \n",
       "\n",
       "[139 rows x 8 columns]"
      ]
     },
     "execution_count": 47,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_yy = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']].set_index(\"关键词\").loc['新媒体运营']\n",
    "df_yy.to_excel(\"新媒体运营.xlsx\",\\\n",
    "                 sheet_name=\"互联网_电商_新媒体运营\")\n",
    "df_yy"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选出前端开发的数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>关键词</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>移动前端开发工程师</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1930032999.shtml</td>\n",
       "      <td>杭州-萧山区</td>\n",
       "      <td>浙江省通信产业服务有限公司文化传媒分公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>15-20k·14薪</td>\n",
       "      <td>https://www.liepin.com/job/1929971663.shtml</td>\n",
       "      <td>成都-高新区</td>\n",
       "      <td>新华三集团</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>web前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>12-17k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929399223.shtml</td>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>高新兴智联科技有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>11-22k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1929170057.shtml</td>\n",
       "      <td>济南-高新区</td>\n",
       "      <td>浪潮电子信息产业</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>高级前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928303553.shtml</td>\n",
       "      <td>合肥-庐阳区</td>\n",
       "      <td>上海汇珏</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1915700912.shtml</td>\n",
       "      <td>长沙-东屯渡</td>\n",
       "      <td>中兴网信</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>web前端开发工程师(004004)</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1919989465.shtml</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>vivo</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1915468791.shtml</td>\n",
       "      <td>上海</td>\n",
       "      <td>上海铱芯信息科技有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>WEB前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·16薪</td>\n",
       "      <td>https://www.liepin.com/job/1925518261.shtml</td>\n",
       "      <td>成都</td>\n",
       "      <td>华为技术有限公司成都研究所</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>前端开发</th>\n",
       "      <td>WEB 前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925485149.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>400 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                      职称     学历     经验          薪水  \\\n",
       "关键词                                                  \n",
       "前端开发           移动前端开发工程师   学历不限  5-10年  10-15k·12薪   \n",
       "前端开发             前端开发工程师   统招本科   经验不限  15-20k·14薪   \n",
       "前端开发          web前端开发工程师  本科及以上  5-10年  12-17k·12薪   \n",
       "前端开发             前端开发工程师   统招本科   3-5年  11-22k·13薪   \n",
       "前端开发           高级前端开发工程师  本科及以上   1-3年   7-12k·12薪   \n",
       "...                  ...    ...    ...         ...   \n",
       "前端开发             前端开发工程师   统招本科   1-3年  10-18k·12薪   \n",
       "前端开发  web前端开发工程师(004004)   统招本科   3-5年          面议   \n",
       "前端开发             前端开发工程师   统招本科   1-3年  10-15k·12薪   \n",
       "前端开发          WEB前端开发工程师  本科及以上   3-5年  15-30k·16薪   \n",
       "前端开发         WEB 前端开发工程师   统招本科   1-3年  15-30k·12薪   \n",
       "\n",
       "                                               链接    公司地点  \\\n",
       "关键词                                                         \n",
       "前端开发  https://www.liepin.com/job/1930032999.shtml  杭州-萧山区   \n",
       "前端开发  https://www.liepin.com/job/1929971663.shtml  成都-高新区   \n",
       "前端开发  https://www.liepin.com/job/1929399223.shtml  广州-黄埔区   \n",
       "前端开发  https://www.liepin.com/job/1929170057.shtml  济南-高新区   \n",
       "前端开发  https://www.liepin.com/job/1928303553.shtml  合肥-庐阳区   \n",
       "...                                           ...     ...   \n",
       "前端开发  https://www.liepin.com/job/1915700912.shtml  长沙-东屯渡   \n",
       "前端开发  https://www.liepin.com/job/1919989465.shtml  深圳-福田区   \n",
       "前端开发  https://www.liepin.com/job/1915468791.shtml      上海   \n",
       "前端开发  https://www.liepin.com/job/1925518261.shtml      成都   \n",
       "前端开发  https://www.liepin.com/job/1925485149.shtml      深圳   \n",
       "\n",
       "                      公司名称  页数  \n",
       "关键词                             \n",
       "前端开发  浙江省通信产业服务有限公司文化传媒分公司   0  \n",
       "前端开发                 新华三集团   0  \n",
       "前端开发           高新兴智联科技有限公司   0  \n",
       "前端开发              浪潮电子信息产业   0  \n",
       "前端开发                  上海汇珏   0  \n",
       "...                    ...  ..  \n",
       "前端开发                  中兴网信   9  \n",
       "前端开发                  vivo   9  \n",
       "前端开发          上海铱芯信息科技有限公司   9  \n",
       "前端开发         华为技术有限公司成都研究所   9  \n",
       "前端开发                    华为   9  \n",
       "\n",
       "[400 rows x 8 columns]"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_qd = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']].set_index(\"关键词\").loc['前端开发']\n",
    "df_qd.to_excel(\"前端开发.xlsx\",\\\n",
    "                 sheet_name=\"互联网_电商_前端开发\")\n",
    "df_qd"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### 筛选出广州、深圳的工作数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>关键词</th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司地点</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>序</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户体验研究专家</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>25-40k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928830743.shtml</td>\n",
       "      <td>深圳-龙岗区</td>\n",
       "      <td>兴硕信息科技(上海)有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>高级用户体验研究员（用户研究岗）</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1927446107.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>高级用户体验研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1927446101.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户体验高级研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>20-35k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1920864427.shtml</td>\n",
       "      <td>北京</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户市场高级研究员</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>16-32k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1920864247.shtml</td>\n",
       "      <td>北京-广安门</td>\n",
       "      <td>中国移动通信有限公司研究院</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1734</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1915700912.shtml</td>\n",
       "      <td>长沙-东屯渡</td>\n",
       "      <td>中兴网信</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1735</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>web前端开发工程师(004004)</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1919989465.shtml</td>\n",
       "      <td>深圳-福田区</td>\n",
       "      <td>vivo</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1736</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1915468791.shtml</td>\n",
       "      <td>上海</td>\n",
       "      <td>上海铱芯信息科技有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1737</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>WEB前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·16薪</td>\n",
       "      <td>https://www.liepin.com/job/1925518261.shtml</td>\n",
       "      <td>成都</td>\n",
       "      <td>华为技术有限公司成都研究所</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1738</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>WEB 前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925485149.shtml</td>\n",
       "      <td>深圳</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>1739 rows × 9 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       关键词                  职称     学历     经验          薪水  \\\n",
       "序                                                          \n",
       "0     用户研究            用户体验研究专家   统招本科   3-5年  25-40k·12薪   \n",
       "1     用户研究    高级用户体验研究员（用户研究岗）  硕士及以上  5-10年  16-32k·13薪   \n",
       "2     用户研究           高级用户体验研究员  硕士及以上  5-10年  16-32k·13薪   \n",
       "3     用户研究           用户体验高级研究员  硕士及以上  5-10年  20-35k·12薪   \n",
       "4     用户研究           用户市场高级研究员  硕士及以上  5-10年  16-32k·13薪   \n",
       "...    ...                 ...    ...    ...         ...   \n",
       "1734  前端开发             前端开发工程师   统招本科   1-3年  10-18k·12薪   \n",
       "1735  前端开发  web前端开发工程师(004004)   统招本科   3-5年          面议   \n",
       "1736  前端开发             前端开发工程师   统招本科   1-3年  10-15k·12薪   \n",
       "1737  前端开发          WEB前端开发工程师  本科及以上   3-5年  15-30k·16薪   \n",
       "1738  前端开发         WEB 前端开发工程师   统招本科   1-3年  15-30k·12薪   \n",
       "\n",
       "                                               链接    公司地点            公司名称  页数  \n",
       "序                                                                              \n",
       "0     https://www.liepin.com/job/1928830743.shtml  深圳-龙岗区  兴硕信息科技(上海)有限公司   0  \n",
       "1     https://www.liepin.com/job/1927446107.shtml      北京   中国移动通信有限公司研究院   0  \n",
       "2     https://www.liepin.com/job/1927446101.shtml      北京   中国移动通信有限公司研究院   0  \n",
       "3     https://www.liepin.com/job/1920864427.shtml      北京   中国移动通信有限公司研究院   0  \n",
       "4     https://www.liepin.com/job/1920864247.shtml  北京-广安门   中国移动通信有限公司研究院   0  \n",
       "...                                           ...     ...             ...  ..  \n",
       "1734  https://www.liepin.com/job/1915700912.shtml  长沙-东屯渡            中兴网信   9  \n",
       "1735  https://www.liepin.com/job/1919989465.shtml  深圳-福田区            vivo   9  \n",
       "1736  https://www.liepin.com/job/1915468791.shtml      上海    上海铱芯信息科技有限公司   9  \n",
       "1737  https://www.liepin.com/job/1925518261.shtml      成都   华为技术有限公司成都研究所   9  \n",
       "1738  https://www.liepin.com/job/1925485149.shtml      深圳              华为   9  \n",
       "\n",
       "[1739 rows x 9 columns]"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_all_1 = df_all[['关键词','职称','学历','经验','薪水','链接','公司地点','公司名称','页数']]\n",
    "df_all_1"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>关键词</th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>公司地点</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>产品管理</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928958071.shtml</td>\n",
       "      <td>广信通信</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>数据分析师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>10-15k·13薪</td>\n",
       "      <td>https://www.liepin.com/job/1926654193.shtml</td>\n",
       "      <td>亚信科技</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>云平台工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1920032861.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>知乎产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-9k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916457809.shtml</td>\n",
       "      <td>联通通信</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>平台产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-9k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1915612930.shtml</td>\n",
       "      <td>联通通信</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>UI设计</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916647853.shtml</td>\n",
       "      <td>联通通信</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>新媒体内容运营岗</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-8k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916823547.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>知乎产品经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-9k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916718125.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户运营</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>7-9k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1927870601.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>NPS用户体验</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-7k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1927516021.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>维系策划岗</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-14k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1919408355.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>UI设计师（外包）</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929162439.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>UI设计</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1916647853.shtml</td>\n",
       "      <td>联通通信</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>UI工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>8-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928536745.shtml</td>\n",
       "      <td>广州市高科通信技术股份有限公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>客户端开发</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>11-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1927586951.shtml</td>\n",
       "      <td>广信通信</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>Android客户端 研发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>11-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925586623.shtml</td>\n",
       "      <td>广信通信</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>前台开发（外派）</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929724117.shtml</td>\n",
       "      <td>公诚管理咨询有限公司第一分公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>UI设计</td>\n",
       "      <td>ios开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929684589.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>运营商BSS、OSS产品规划经理产品规划总监（部门负责人）</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-50k·15薪</td>\n",
       "      <td>https://www.liepin.com/a/21037937.shtml</td>\n",
       "      <td>广州某物联网，大数据，企业信息化集成商</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>产品经理（海外）</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>18-26k·15薪</td>\n",
       "      <td>https://www.liepin.com/a/21313655.shtml</td>\n",
       "      <td>5G通讯公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>EI产品经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>30-40k·15薪</td>\n",
       "      <td>https://www.liepin.com/a/21090013.shtml</td>\n",
       "      <td>某知名互联网公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>18-35k·14薪</td>\n",
       "      <td>https://www.liepin.com/a/21062757.shtml</td>\n",
       "      <td>国内知名通信公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>产品经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>20-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/a/21062269.shtml</td>\n",
       "      <td>国内知名公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>EI产品经理</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>30-60k·16薪</td>\n",
       "      <td>https://www.liepin.com/a/21042967.shtml</td>\n",
       "      <td>某著名互联网公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>产品经理（解决方案）</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·14薪</td>\n",
       "      <td>https://www.liepin.com/job/1929573153.shtml</td>\n",
       "      <td>鲁邦通</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>AI硬件产品经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>15-25k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928314167.shtml</td>\n",
       "      <td>广州慧睿思通信息科技有限公司</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>渠道经理（通信产品方向）</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>7-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925881603.shtml</td>\n",
       "      <td>广州慧睿思通信息科技有限公司</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>产品经理</td>\n",
       "      <td>产品经理+数字广东</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>9-13k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929880887.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>学历不限</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>4-7k·12薪</td>\n",
       "      <td>https://www.liepin.com/a/21262387.shtml</td>\n",
       "      <td>某知名企业</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>高级新媒体运营专员+五险一金</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>6-8k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1923535393.shtml</td>\n",
       "      <td>广州浚峰网络技术有限公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1922835517.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>运营经理</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-18k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929465949.shtml</td>\n",
       "      <td>广信通信</td>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>中级前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925586825.shtml</td>\n",
       "      <td>广信通信</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>15-20k·13薪</td>\n",
       "      <td>https://www.liepin.com/a/21307835.shtml</td>\n",
       "      <td>知名通讯行业</td>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>web前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>12-20k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1927077159.shtml</td>\n",
       "      <td>广州润芯信息技术有限公司</td>\n",
       "      <td>3</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925248211.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>8-13k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928536743.shtml</td>\n",
       "      <td>广州市高科通信技术股份有限公司</td>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师（外派驻点）</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>10-15k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1928716185.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>资深前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1926478309.shtml</td>\n",
       "      <td>爱立信中国</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>前端开发工程师（驻点南航）</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>7-12k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1927913093.shtml</td>\n",
       "      <td>彩讯科技股份有限公司</td>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>WEB前端开发</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>10-13k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1923872747.shtml</td>\n",
       "      <td>中国联通广东省分公司</td>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "        关键词                             职称     学历     经验          薪水  \\\n",
       "公司地点                                                                   \n",
       "广州     用户研究                           产品管理  大专及以上   1-3年  10-18k·12薪   \n",
       "广州     用户研究                          数据分析师   统招本科   3-5年  10-15k·13薪   \n",
       "广州     用户研究                         云平台工程师  本科及以上   经验不限          面议   \n",
       "广州     用户研究                         知乎产品经理  本科及以上   1-3年    7-9k·12薪   \n",
       "广州     用户研究                         平台产品经理  本科及以上   1-3年    7-9k·12薪   \n",
       "广州     用户研究                           UI设计  本科及以上   1-3年   8-12k·12薪   \n",
       "广州     用户研究                       新媒体内容运营岗   统招本科   1-3年    6-8k·12薪   \n",
       "广州     用户研究                         知乎产品经理   统招本科   1-3年    7-9k·12薪   \n",
       "广州     用户研究                           用户运营  本科及以上   1-3年    7-9k·12薪   \n",
       "广州     用户研究                        NPS用户体验  本科及以上   1-3年    6-7k·12薪   \n",
       "广州     用户研究                          维系策划岗   统招本科   1-3年   8-14k·12薪   \n",
       "广州     UI设计                      UI设计师（外包）  本科及以上   经验不限   8-12k·12薪   \n",
       "广州     UI设计                           UI设计  本科及以上   1-3年   8-12k·12薪   \n",
       "广州     UI设计                          UI工程师  本科及以上   经验不限   8-12k·12薪   \n",
       "广州     UI设计                          客户端开发   统招本科   1-3年  11-20k·12薪   \n",
       "广州     UI设计               Android客户端 研发工程师  本科及以上   1-3年  11-20k·12薪   \n",
       "广州     UI设计                       前台开发（外派）   学历不限   经验不限  10-15k·12薪   \n",
       "广州     UI设计                       ios开发工程师  本科及以上   3-5年  15-20k·12薪   \n",
       "广州     产品经理  运营商BSS、OSS产品规划经理产品规划总监（部门负责人）  大专及以上  5-10年  30-50k·15薪   \n",
       "广州     产品经理                       产品经理（海外）   统招本科   经验不限  18-26k·15薪   \n",
       "广州     产品经理                         EI产品经理   统招本科   3-5年  30-40k·15薪   \n",
       "广州     产品经理                           产品经理   统招本科   3-5年  18-35k·14薪   \n",
       "广州     产品经理                           产品经理   统招本科   1-3年  20-30k·12薪   \n",
       "广州     产品经理                         EI产品经理   统招本科  5-10年  30-60k·16薪   \n",
       "广州     产品经理                     产品经理（解决方案）  本科及以上   1-3年  10-15k·14薪   \n",
       "广州     产品经理                       AI硬件产品经理  本科及以上  5-10年  15-25k·12薪   \n",
       "广州     产品经理                   渠道经理（通信产品方向）  大专及以上   3-5年   7-15k·12薪   \n",
       "广州     产品经理                      产品经理+数字广东  大专及以上  5-10年   9-13k·12薪   \n",
       "广州    新媒体运营                          新媒体运营   学历不限   3-5年    4-7k·12薪   \n",
       "广州    新媒体运营                 高级新媒体运营专员+五险一金  大专及以上   1-3年    6-8k·12薪   \n",
       "广州    新媒体运营                          新媒体运营  本科及以上   1-3年  10-15k·12薪   \n",
       "广州    新媒体运营                           运营经理  本科及以上   1-3年  10-18k·12薪   \n",
       "广州     前端开发                      中级前端开发工程师   统招本科   1-3年  10-20k·12薪   \n",
       "广州     前端开发                        前端开发工程师  本科及以上  5-10年  15-20k·13薪   \n",
       "广州     前端开发                     web前端开发工程师   统招本科   1-3年  12-20k·12薪   \n",
       "广州     前端开发                        前端开发工程师   统招本科   1-3年  10-15k·12薪   \n",
       "广州     前端开发                        前端开发工程师  本科及以上   经验不限   8-13k·12薪   \n",
       "广州     前端开发                  前端开发工程师（外派驻点）  大专及以上   经验不限  10-15k·12薪   \n",
       "广州     前端开发                      资深前端开发工程师   统招本科  5-10年          面议   \n",
       "广州     前端开发                  前端开发工程师（驻点南航）  大专及以上   经验不限   7-12k·12薪   \n",
       "广州     前端开发                        WEB前端开发   统招本科   1-3年  10-13k·12薪   \n",
       "\n",
       "                                               链接                 公司名称  页数  \n",
       "公司地点                                                                        \n",
       "广州    https://www.liepin.com/job/1928958071.shtml                 广信通信   1  \n",
       "广州    https://www.liepin.com/job/1926654193.shtml                 亚信科技   3  \n",
       "广州    https://www.liepin.com/job/1920032861.shtml           中国联通广东省分公司   5  \n",
       "广州    https://www.liepin.com/job/1916457809.shtml                 联通通信   6  \n",
       "广州    https://www.liepin.com/job/1915612930.shtml                 联通通信   6  \n",
       "广州    https://www.liepin.com/job/1916647853.shtml                 联通通信   6  \n",
       "广州    https://www.liepin.com/job/1916823547.shtml           中国联通广东省分公司   7  \n",
       "广州    https://www.liepin.com/job/1916718125.shtml           中国联通广东省分公司   7  \n",
       "广州    https://www.liepin.com/job/1927870601.shtml           彩讯科技股份有限公司   7  \n",
       "广州    https://www.liepin.com/job/1927516021.shtml           彩讯科技股份有限公司   7  \n",
       "广州    https://www.liepin.com/job/1919408355.shtml           中国联通广东省分公司   8  \n",
       "广州    https://www.liepin.com/job/1929162439.shtml           彩讯科技股份有限公司   1  \n",
       "广州    https://www.liepin.com/job/1916647853.shtml                 联通通信   2  \n",
       "广州    https://www.liepin.com/job/1928536745.shtml      广州市高科通信技术股份有限公司   4  \n",
       "广州    https://www.liepin.com/job/1927586951.shtml                 广信通信   5  \n",
       "广州    https://www.liepin.com/job/1925586623.shtml                 广信通信   5  \n",
       "广州    https://www.liepin.com/job/1929724117.shtml      公诚管理咨询有限公司第一分公司   9  \n",
       "广州    https://www.liepin.com/job/1929684589.shtml           彩讯科技股份有限公司   9  \n",
       "广州        https://www.liepin.com/a/21037937.shtml  广州某物联网，大数据，企业信息化集成商   0  \n",
       "广州        https://www.liepin.com/a/21313655.shtml               5G通讯公司   0  \n",
       "广州        https://www.liepin.com/a/21090013.shtml             某知名互联网公司   4  \n",
       "广州        https://www.liepin.com/a/21062757.shtml             国内知名通信公司   4  \n",
       "广州        https://www.liepin.com/a/21062269.shtml               国内知名公司   4  \n",
       "广州        https://www.liepin.com/a/21042967.shtml             某著名互联网公司   4  \n",
       "广州    https://www.liepin.com/job/1929573153.shtml                  鲁邦通   6  \n",
       "广州    https://www.liepin.com/job/1928314167.shtml       广州慧睿思通信息科技有限公司   8  \n",
       "广州    https://www.liepin.com/job/1925881603.shtml       广州慧睿思通信息科技有限公司   8  \n",
       "广州    https://www.liepin.com/job/1929880887.shtml           彩讯科技股份有限公司   9  \n",
       "广州        https://www.liepin.com/a/21262387.shtml                某知名企业   0  \n",
       "广州    https://www.liepin.com/job/1923535393.shtml         广州浚峰网络技术有限公司   0  \n",
       "广州    https://www.liepin.com/job/1922835517.shtml           中国联通广东省分公司   1  \n",
       "广州    https://www.liepin.com/job/1929465949.shtml                 广信通信   2  \n",
       "广州    https://www.liepin.com/job/1925586825.shtml                 广信通信   0  \n",
       "广州        https://www.liepin.com/a/21307835.shtml               知名通讯行业   1  \n",
       "广州    https://www.liepin.com/job/1927077159.shtml         广州润芯信息技术有限公司   3  \n",
       "广州    https://www.liepin.com/job/1925248211.shtml           中国联通广东省分公司   4  \n",
       "广州    https://www.liepin.com/job/1928536743.shtml      广州市高科通信技术股份有限公司   4  \n",
       "广州    https://www.liepin.com/job/1928716185.shtml           彩讯科技股份有限公司   5  \n",
       "广州    https://www.liepin.com/job/1926478309.shtml                爱立信中国   6  \n",
       "广州    https://www.liepin.com/job/1927913093.shtml           彩讯科技股份有限公司   6  \n",
       "广州    https://www.liepin.com/job/1923872747.shtml           中国联通广东省分公司   7  "
      ]
     },
     "execution_count": 44,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Select the postings located in Guangzhou. Indexing with a one-element list\n",
    "# (instead of a scalar label) guarantees a DataFrame even when only a single\n",
    "# row matches; a scalar label would collapse that case to a Series and the\n",
    "# exported sheet would come out transposed.\n",
    "df_gz = df_all_1.set_index(\"公司地点\").loc[['广州']]\n",
    "# Write the city subset to its own workbook (no backslash needed inside parentheses).\n",
    "df_gz.to_excel(\n",
    "    \"广州_用户研究_UI设计_产品经理_新媒体运营_前端开发.xlsx\",\n",
    "    sheet_name=\"互联网_电商_广州\",\n",
    ")\n",
    "df_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>关键词</th>\n",
       "      <th>职称</th>\n",
       "      <th>学历</th>\n",
       "      <th>经验</th>\n",
       "      <th>薪水</th>\n",
       "      <th>链接</th>\n",
       "      <th>公司名称</th>\n",
       "      <th>页数</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>公司地点</th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户研究分析师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>18-25k·13薪</td>\n",
       "      <td>https://www.liepin.com/a/20505835.shtml</td>\n",
       "      <td>某知名电子高科技公司</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户研究经理(006727)</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929602255.shtml</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户研究经理（人机交互研究方向）</td>\n",
       "      <td>硕士及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>35-65k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929565887.shtml</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户研究经理（体验设计方向）</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>经验不限</td>\n",
       "      <td>30-60k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1929309749.shtml</td>\n",
       "      <td>vivo</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>用户研究</td>\n",
       "      <td>用户研究员</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-25k·16薪</td>\n",
       "      <td>https://www.liepin.com/job/1929110707.shtml</td>\n",
       "      <td>传音控股</td>\n",
       "      <td>0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>电商前端开发工程师（SE）-797998869978</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1925825391.shtml</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>web前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>20-40k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1919208423.shtml</td>\n",
       "      <td>OPPO广东移动通信有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>高级前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>5-10年</td>\n",
       "      <td>面议</td>\n",
       "      <td>https://www.liepin.com/job/1915663881.shtml</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>web前端开发工程师</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925675857.shtml</td>\n",
       "      <td>OPPO广东移动通信有限公司</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>深圳</th>\n",
       "      <td>前端开发</td>\n",
       "      <td>WEB 前端开发工程师</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>15-30k·12薪</td>\n",
       "      <td>https://www.liepin.com/job/1925485149.shtml</td>\n",
       "      <td>华为</td>\n",
       "      <td>9</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>217 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "       关键词                          职称     学历     经验          薪水  \\\n",
       "公司地点                                                               \n",
       "深圳    用户研究                     用户研究分析师  本科及以上   3-5年  18-25k·13薪   \n",
       "深圳    用户研究              用户研究经理(006727)  本科及以上   1-3年  15-30k·12薪   \n",
       "深圳    用户研究            用户研究经理（人机交互研究方向）  硕士及以上  5-10年  35-65k·12薪   \n",
       "深圳    用户研究              用户研究经理（体验设计方向）  本科及以上   经验不限  30-60k·12薪   \n",
       "深圳    用户研究                       用户研究员   统招本科   3-5年  15-25k·16薪   \n",
       "...    ...                         ...    ...    ...         ...   \n",
       "深圳    前端开发  电商前端开发工程师（SE）-797998869978  本科及以上  5-10年          面议   \n",
       "深圳    前端开发                  web前端开发工程师   统招本科   3-5年  20-40k·12薪   \n",
       "深圳    前端开发                   高级前端开发工程师   统招本科  5-10年          面议   \n",
       "深圳    前端开发                  web前端开发工程师  本科及以上   3-5年  15-30k·12薪   \n",
       "深圳    前端开发                 WEB 前端开发工程师   统招本科   1-3年  15-30k·12薪   \n",
       "\n",
       "                                               链接            公司名称  页数  \n",
       "公司地点                                                                   \n",
       "深圳        https://www.liepin.com/a/20505835.shtml      某知名电子高科技公司   0  \n",
       "深圳    https://www.liepin.com/job/1929602255.shtml            vivo   0  \n",
       "深圳    https://www.liepin.com/job/1929565887.shtml            vivo   0  \n",
       "深圳    https://www.liepin.com/job/1929309749.shtml            vivo   0  \n",
       "深圳    https://www.liepin.com/job/1929110707.shtml            传音控股   0  \n",
       "...                                           ...             ...  ..  \n",
       "深圳    https://www.liepin.com/job/1925825391.shtml              华为   9  \n",
       "深圳    https://www.liepin.com/job/1919208423.shtml  OPPO广东移动通信有限公司   9  \n",
       "深圳    https://www.liepin.com/job/1915663881.shtml              华为   9  \n",
       "深圳    https://www.liepin.com/job/1925675857.shtml  OPPO广东移动通信有限公司   9  \n",
       "深圳    https://www.liepin.com/job/1925485149.shtml              华为   9  \n",
       "\n",
       "[217 rows x 8 columns]"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Select the postings located in Shenzhen. Indexing with a one-element list\n",
    "# (instead of a scalar label) guarantees a DataFrame even when only a single\n",
    "# row matches; a scalar label would collapse that case to a Series and the\n",
    "# exported sheet would come out transposed.\n",
    "df_sz = df_all_1.set_index(\"公司地点\").loc[['深圳']]\n",
    "# Write the city subset to its own workbook (no backslash needed inside parentheses).\n",
    "df_sz.to_excel(\n",
    "    \"深圳_用户研究_UI设计_产品经理_新媒体运营_前端开发.xlsx\",\n",
    "    sheet_name=\"互联网_电商_深圳\",\n",
    ")\n",
    "df_sz"
   ]
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.7.3"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": true
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
